VQA Samples for Selected IDs (81, 1037, 1560, 3669, 9678, 10016)
ID #81
{
"id": "81",
"image": "/Users/xjh/Desktop/UTS/Research/Dataset/RSVL-VQA/INRIA-Aerial-Image-Labeling/train/images/kitsap25.tif",
"vqa_pairs": [
{
"question_id": "1",
"question_type": "spatial",
"question": "Where is the residential area located in relation to the industrial port facility?",
"answer": "The residential area is located to the north of the industrial port facility."
},
{
"question_id": "2",
"question_type": "spatial",
"question": "What feature extends from the industrial port facility into the water?",
"answer": "Long piers extend from the industrial port facility into the water."
},
{
"question_id": "3",
"question_type": "spatial",
"question": "Where is the green space or park situated within the image?",
"answer": "The green space or park is situated within the residential area to the north of the industrial port facility."
},
{
"question_id": "4",
"question_type": "object",
"question": "What types of vessels are moored alongside the piers?",
"answer": "Ships are moored alongside the long piers."
},
{
"question_id": "5",
"question_type": "overall",
"question": "What type of area is shown in the image?",
"answer": "The image shows a coastal area with an industrial port facility along the shoreline and a residential area to the north."
},
{
"question_id": "6",
"question_type": "overall",
"question": "What are the main features of the landscape in the image?",
"answer": "The main features include an industrial port with piers and ships, a residential neighborhood with a grid street pattern, green spaces including a park, and open water with visible wake patterns."
},
{
"question_id": "7",
"question_type": "count",
"question": "How many buildings are there in the image?",
"answer": "There are 716 buildings in the image."
},
{
"question_id": "8",
"question_type": "presence",
"question": "Are there any buildings in the image?",
"answer": "Yes, there are 716 buildings."
},
{
"question_id": "9",
"question_type": "caption",
"question": "Generate a detailed caption for this image.",
"answer": "The image is dominated by an extensive industrial port facility along the shoreline, featuring many large rectangular buildings and warehouses, as well as several long piers extending into the water with ships moored alongside. To the north, there is a clear transition to a residential area with smaller houses and a grid-like street pattern, as well as a sizable green space or park with trees and pathways. The lower portion of the image is open water, with visible wake patterns and barriers. The built environment, including the port infrastructure and residential area, makes up a substantial but not overwhelming portion of the landscape, consistent with a moderate presence of buildings but also significant open and green areas."
}
],
"tags": [
"coastal area",
"industrial port",
"docks",
"large buildings",
"warehouses",
"piers",
"ships",
"urban neighborhood",
"residential houses",
"grid street pattern",
"green spaces",
"park",
"trees",
"pathways",
"open water",
"wake patterns",
"water barriers"
],
"relations": [
{
"object1": "industrial port facility",
"relation": "along",
"object2": "shoreline"
},
{
"object1": "long piers",
"relation": "extending into",
"object2": "water"
},
{
"object1": "ships",
"relation": "moored alongside",
"object2": "long piers"
},
{
"object1": "residential area",
"relation": "to the north",
"object2": "industrial port facility"
},
{
"object1": "green space or park",
"relation": "within",
"object2": "residential area"
},
{
"object1": "open water",
"relation": "in",
"object2": "lower portion of the image"
}
]
}
ID #1037
{
"id": "1037",
"image": "/Users/xjh/Desktop/UTS/Research/Dataset/RSVL-VQA/iSAID/train/train/images/P1779.png",
"vqa_pairs": [
{
"question_id": "1",
"question_type": "spatial",
"question": "Where is the warehouse structure located within the image frame?",
"answer": "The warehouse structure occupies the lower part of the frame."
},
{
"question_id": "2",
"question_type": "spatial",
"question": "What is situated at the upper and right edges of the image?",
"answer": "Roadways and small green patches with scattered trees are situated at the upper and right edges of the image."
},
{
"question_id": "3",
"question_type": "spatial",
"question": "What surrounds the warehouse structure in the image?",
"answer": "Paved areas surround the warehouse structure."
},
{
"question_id": "4",
"question_type": "object",
"question": "What kind of building is prominently featured in the image?",
"answer": "A large warehouse building is prominently featured."
},
{
"question_id": "5",
"question_type": "overall",
"question": "What type of area does the image depict?",
"answer": "The image depicts an industrial or commercial site focused on logistics and distribution operations."
},
{
"question_id": "6",
"question_type": "overall",
"question": "What is the dominant type of surface in the image?",
"answer": "Impervious surfaces such as paved areas and parking lots dominate the image."
},
{
"question_id": "7",
"question_type": "count",
"question": "How many large vehicles are there in the image?",
"answer": "There are 31 large vehicles in the image."
},
{
"question_id": "8",
"question_type": "presence",
"question": "Are there any large vehicles in the image?",
"answer": "Yes, there are 31 large vehicles."
},
{
"question_id": "9",
"question_type": "comparison",
"question": "Are there more large vehicles or small vehicles in the image?",
"answer": "There are more large vehicles (31) than small vehicles (4)."
},
{
"question_id": "10",
"question_type": "count",
"question": "How many small vehicles are there in the image?",
"answer": "There are 4 small vehicles in the image."
},
{
"question_id": "11",
"question_type": "presence",
"question": "Are there any small vehicles in the image?",
"answer": "Yes, there are 4 small vehicles."
},
{
"question_id": "12",
"question_type": "total_count",
"question": "What is the total number of objects in the image?",
"answer": "There are a total of 35 objects in the image, consisting of 31 large vehicles and 4 small vehicles."
},
{
"question_id": "13",
"question_type": "caption",
"question": "Generate a detailed caption for this image.",
"answer": "The image predominantly features an industrial or commercial site, with a large warehouse structure occupying the lower part of the frame. Surrounding the warehouse are extensive paved areas used for parking and maneuvering, with many trucks and trailers neatly lined up in rows, indicating active logistics or distribution operations. The upper and right edges of the image show roadways providing access to the facility, with some small green patches and scattered trees adding minimal vegetation to the otherwise built-up landscape. The overall scene is dominated by impervious surfaces and vehicles, with only a small portion of natural land cover visible."
}
],
"tags": [
"industrial facility",
"warehouse building",
"parked trucks",
"paved areas",
"parking lot",
"roadways",
"greenery",
"trees",
"impervious surfaces",
"logistics operations"
],
"relations": [
{
"object1": "warehouse structure",
"relation": "occupies",
"object2": "lower part of the frame"
},
{
"object1": "paved areas",
"relation": "surround",
"object2": "warehouse"
},
{
"object1": "trucks and trailers",
"relation": "lined up in rows on",
"object2": "paved areas"
},
{
"object1": "roadways",
"relation": "are at",
"object2": "upper and right edges of the image"
},
{
"object1": "roadways",
"relation": "provide access to",
"object2": "facility"
},
{
"object1": "small green patches and scattered trees",
"relation": "are at",
"object2": "upper and right edges of the image"
},
{
"object1": "small green patches and scattered trees",
"relation": "add",
"object2": "minimal vegetation to the landscape"
}
]
}
ID #1560
{
"id": "1560",
"image": "/Users/xjh/Desktop/UTS/Research/Dataset/RSVL-VQA/iSAID/train/train/images/P2797.png",
"vqa_pairs": [
{
"question_id": "1",
"question_type": "spatial",
"question": "Where are the parking lots located in the image?",
"answer": "The parking lots are located in the upper part of the image."
},
{
"question_id": "2",
"question_type": "spatial",
"question": "What is positioned along the left side of the image?",
"answer": "Small grassy areas are positioned along the left side of the image."
},
{
"question_id": "3",
"question_type": "spatial",
"question": "Where are the ground service vehicles and equipment in relation to the airplanes?",
"answer": "Ground service vehicles and equipment are attending the commercial airplanes parked at gates."
},
{
"question_id": "4",
"question_type": "object",
"question": "What types of vehicles can be seen in the parking lots?",
"answer": "Cars and buses can be seen in the parking lots."
},
{
"question_id": "5",
"question_type": "overall",
"question": "What type of area is mainly shown in the image?",
"answer": "The image mainly shows an airport apron area."
},
{
"question_id": "6",
"question_type": "overall",
"question": "Is the scene dominated more by natural or built infrastructure?",
"answer": "The scene is dominated more by built infrastructure."
},
{
"question_id": "7",
"question_type": "quantity",
"question": "Do the grassy areas occupy a large or small portion of the landscape?",
"answer": "The grassy areas occupy only a minor portion of the landscape."
},
{
"question_id": "8",
"question_type": "count",
"question": "How many large vehicles are there in the image?",
"answer": "There are 3 large vehicles in the image."
},
{
"question_id": "9",
"question_type": "presence",
"question": "Are there any large vehicles in the image?",
"answer": "Yes, there are 3 large vehicles."
},
{
"question_id": "10",
"question_type": "comparison",
"question": "Are there more large vehicles or small vehicles in the image?",
"answer": "There are more small vehicles (8) than large vehicles (3)."
},
{
"question_id": "11",
"question_type": "count",
"question": "How many small vehicles are there in the image?",
"answer": "There are 8 small vehicles in the image."
},
{
"question_id": "12",
"question_type": "presence",
"question": "Are there any small vehicles in the image?",
"answer": "Yes, there are 8 small vehicles."
},
{
"question_id": "13",
"question_type": "count",
"question": "How many planes are there in the image?",
"answer": "There are 4 planes in the image."
},
{
"question_id": "14",
"question_type": "presence",
"question": "Are there any planes in the image?",
"answer": "Yes, there are 4 planes."
},
{
"question_id": "15",
"question_type": "total_count",
"question": "What is the total number of objects in the image?",
"answer": "There are a total of 15 objects in the image, consisting of 3 large vehicles, 8 small vehicles, and 4 planes."
},
{
"question_id": "16",
"question_type": "caption",
"question": "Generate a detailed caption for this image.",
"answer": "The image predominantly displays an airport apron, characterized by a vast concrete surface where several commercial airplanes are parked at gates, each attended by various ground service vehicles and equipment. The upper part of the image contains parking lots with cars and buses, as well as roadways facilitating airport traffic. Small grassy areas are visible along the left side, but they occupy only a minor portion of the landscape. Overall, the scene is dominated by built infrastructure, with aviation operations and support activities clearly visible, and only minimal natural land cover present."
}
],
"tags": [
"airport apron",
"airplanes",
"gates",
"concrete surface",
"service vehicles",
"ground support equipment",
"parking lots",
"cars",
"buses",
"roadways",
"grass patches"
],
"relations": [
{
"object1": "commercial airplanes",
"relation": "parked at",
"object2": "gates"
},
{
"object1": "ground service vehicles and equipment",
"relation": "attend",
"object2": "commercial airplanes"
},
{
"object1": "parking lots",
"relation": "located in",
"object2": "upper part of the image"
},
{
"object1": "cars and buses",
"relation": "in",
"object2": "parking lots"
},
{
"object1": "roadways",
"relation": "in",
"object2": "upper part of the image"
},
{
"object1": "small grassy areas",
"relation": "along",
"object2": "left side"
},
{
"object1": "small grassy areas",
"relation": "occupy",
"object2": "minor portion of the landscape"
}
]
}
ID #3669
{
"id": "3669",
"image": "/Users/xjh/Desktop/UTS/Research/Dataset/RSVL-VQA/LoveDA/test/Test/Urban/images_png/5812.png",
"vqa_pairs": [
{
"question_id": "1",
"question_type": "spatial",
"question": "Where are the industrial or warehouse structures located in the image?",
"answer": "They are occupying the central and southern areas of the image."
},
{
"question_id": "2",
"question_type": "spatial",
"question": "What feature separates the industrial zone from the residential area?",
"answer": "A canal runs horizontally and separates the industrial zone from the residential area."
},
{
"question_id": "3",
"question_type": "spatial",
"question": "What crosses the canal to connect the industrial and residential areas?",
"answer": "A small bridge crosses the canal, indicating connectivity between the two sides."
},
{
"question_id": "4",
"question_type": "object",
"question": "What types of buildings are found in the residential area?",
"answer": "The residential area has several apartment blocks."
},
{
"question_id": "5",
"question_type": "quantity",
"question": "Are paved surfaces mainly adjacent to industrial buildings or residential complexes?",
"answer": "Paved surfaces, including roads and parking lots, are mostly adjacent to the industrial buildings."
},
{
"question_id": "6",
"question_type": "caption",
"question": "Generate a detailed caption for this image.",
"answer": "The image is dominated by industrial or warehouse structures with distinct red and blue rooftops, occupying much of the central and southern areas. Above these buildings, a canal runs horizontally, separating the industrial zone from a residential area with several apartment blocks. The canal is crossed by a small bridge, indicating connectivity between the two sides. There are paved surfaces, including roads and parking lots, mostly adjacent to the industrial buildings. In the upper right and left corners, there are patches of green or overgrown land, with the upper left area possibly being an orchard, garden, or cemetery due to its grid-like pattern. Overall, the landscape is a blend of built-up industrial, residential, and some green/vacant spaces, with clear separation by the canal."
}
],
"tags": [
"industrial buildings",
"warehouse structures",
"red rooftops",
"blue rooftops",
"canal",
"bridge",
"residential complexes",
"apartment blocks",
"roads",
"parking lots",
"vegetated land",
"vacant land",
"orchard",
"garden",
"cemetery",
"paved surfaces",
"green patches"
],
"relations": [
{
"object1": "industrial or warehouse structures",
"relation": "occupying",
"object2": "central and southern areas"
},
{
"object1": "canal",
"relation": "runs above",
"object2": "industrial or warehouse structures"
},
{
"object1": "canal",
"relation": "separates",
"object2": "industrial zone and residential area"
},
{
"object1": "residential area",
"relation": "has",
"object2": "several apartment blocks"
},
{
"object1": "small bridge",
"relation": "crosses",
"object2": "canal"
},
{
"object1": "paved surfaces",
"relation": "are adjacent to",
"object2": "industrial buildings"
},
{
"object1": "patches of green or overgrown land",
"relation": "are in",
"object2": "upper right and left corners"
},
{
"object1": "upper left area",
"relation": "possibly is",
"object2": "orchard, garden, or cemetery"
},
{
"object1": "canal",
"relation": "separates",
"object2": "built-up industrial, residential, and green/vacant spaces"
}
]
}
ID #9678
{
"id": "9678",
"image": "/Users/xjh/Desktop/UTS/Research/Dataset/RSVL-VQA/WHU/test/test/310207.TIF",
"vqa_pairs": [
{
"question_id": "1",
"question_type": "spatial",
"question": "Where are the large buildings located within the image?",
"answer": "The large buildings are located in the southeastern quadrant of the image."
},
{
"question_id": "2",
"question_type": "spatial",
"question": "Which parts of the image are dominated by open grassy land?",
"answer": "The central and northern parts of the image are dominated by open grassy land."
},
{
"question_id": "3",
"question_type": "spatial",
"question": "Where are the paved roads situated around the site?",
"answer": "The paved roads border the site to the north and east."
},
{
"question_id": "4",
"question_type": "object",
"question": "What kind of scattered objects are found in the western section of the image?",
"answer": "Scattered objects and debris related to industrial or construction activity are found in the western section."
},
{
"question_id": "5",
"question_type": "overall",
"question": "What type of area is primarily depicted in the image?",
"answer": "The image primarily depicts a developed industrial or commercial area."
},
{
"question_id": "6",
"question_type": "overall",
"question": "How would you describe the land coverage in the image?",
"answer": "Much of the land is open grassy or disturbed soil, with substantial building coverage mainly in the southeastern quadrant."
},
{
"question_id": "7",
"question_type": "quantity",
"question": "Are the large buildings concentrated or scattered throughout the site?",
"answer": "The large buildings are concentrated in a cluster in the southeastern quadrant."
},
{
"question_id": "8",
"question_type": "count",
"question": "How many buildings are there in the image?",
"answer": "There are 7 buildings in the image."
},
{
"question_id": "9",
"question_type": "presence",
"question": "Are there any buildings in the image?",
"answer": "Yes, there are 7 buildings."
},
{
"question_id": "10",
"question_type": "caption",
"question": "Generate a detailed caption for this image.",
"answer": "The image primarily depicts a developed industrial or commercial area, with a cluster of large buildings occupying a significant portion of the southeastern quadrant. The central and northern parts of the image are dominated by open grassy land, interspersed with patches of bare or disturbed soil, likely due to construction or industrial activity. Paved roads border the site to the north and east, providing access to the area. There are also some scattered objects and debris, particularly in the western section, which may be related to ongoing or past industrial processes. Overall, the image confirms the presence of substantial building coverage, but much of the land is open or disturbed rather than built-up."
}
],
"tags": [
"industrial site",
"commercial site",
"large buildings",
"open grassy areas",
"bare soil",
"disturbed soil",
"paved roads",
"scattered debris",
"construction activity"
],
"relations": [
{
"object1": "cluster of large buildings",
"relation": "occupying",
"object2": "southeastern quadrant"
},
{
"object1": "central and northern parts of the image",
"relation": "dominated by",
"object2": "open grassy land"
},
{
"object1": "open grassy land",
"relation": "interspersed with",
"object2": "patches of bare or disturbed soil"
},
{
"object1": "paved roads",
"relation": "border",
"object2": "site to the north and east"
},
{
"object1": "scattered objects and debris",
"relation": "located in",
"object2": "western section"
}
]
}
ID #10016
{
"id": "10016",
"image": "/Users/xjh/Desktop/UTS/Research/Dataset/RSVL-VQA/WHU/test/test/310545.TIF",
"vqa_pairs": [
{
"question_id": "1",
"question_type": "spatial",
"question": "Where are the buildings located in the image?",
"answer": "The buildings are located in the right-central area of the image."
},
{
"question_id": "2",
"question_type": "spatial",
"question": "What natural features surround the buildings and structures?",
"answer": "The buildings and structures are surrounded by dense tree cover and some landscaped areas."
},
{
"question_id": "3",
"question_type": "spatial",
"question": "Where is the road located in the image?",
"answer": "The road is located at the bottom of the image."
},
{
"question_id": "4",
"question_type": "overall",
"question": "What type of landscape is depicted in the image?",
"answer": "The image depicts a predominantly rural and open landscape."
},
{
"question_id": "5",
"question_type": "overall",
"question": "How would you describe the distribution of natural versus built-up areas in the scene?",
"answer": "Natural areas dominate the scene with expansive grassy fields and tree cover, while built-up features are limited to a compact section."
},
{
"question_id": "6",
"question_type": "quantity",
"question": "Are the built-up features spread throughout the image or confined to a specific area?",
"answer": "The built-up features are confined to a compact section in the right-central area."
},
{
"question_id": "7",
"question_type": "count",
"question": "How many buildings are there in the image?",
"answer": "There are 8 buildings in the image."
},
{
"question_id": "8",
"question_type": "presence",
"question": "Are there any buildings in the image?",
"answer": "Yes, there are 8 buildings."
},
{
"question_id": "9",
"question_type": "caption",
"question": "Generate a detailed caption for this image.",
"answer": "The image primarily consists of expansive grassy fields, with the majority of the land cover being open and undeveloped. A small portion of the image, particularly in the right-central area, contains several buildings and associated structures, which are surrounded by dense tree cover and some landscaped areas. The buildings occupy only a minor fraction of the overall scene, consistent with the description of a small percentage of building cover. Tree lines and clusters provide natural boundaries and shade, while the road at the bottom suggests access to the property. Overall, the landscape is predominantly rural and open, with built-up features limited to a compact section."
}
],
"tags": [
"open grassy fields",
"clusters of trees",
"buildings",
"structures",
"road",
"tree lines",
"landscaped areas",
"rural landscape"
],
"relations": [
{
"object1": "several buildings and associated structures",
"relation": "in",
"object2": "right-central area"
},
{
"object1": "several buildings and associated structures",
"relation": "surrounded by",
"object2": "dense tree cover and some landscaped areas"
},
{
"object1": "road",
"relation": "at",
"object2": "bottom"
},
{
"object1": "built-up features",
"relation": "limited to",
"object2": "compact section"
}
]
}